Document description:

This notebook contains the code used to process the raw data provided for the CEGE0042 final assignment. It covers:

  1. Project set up

  2. Area selection (Islington)

  3. Data sub-selection for further analysis

1. Project set up:

#Packages
library(sf)
Linking to GEOS 3.5.1, GDAL 2.2.2, PROJ 4.9.2
library(sp)
library(tmap)
Registered S3 methods overwritten by 'htmltools':
  method               from         
  print.html           tools:rstudio
  print.shiny.tag      tools:rstudio
  print.shiny.tag.list tools:rstudio
Registered S3 method overwritten by 'htmlwidgets':
  method           from         
  print.htmlwidget tools:rstudio
replacing previous import ‘sf::st_make_valid’ by ‘lwgeom::st_make_valid’ when loading ‘tmap’
#Working directory definition
#getwd()

# Load data
# Restore the saved workspace image; load() recreates the stored objects in
# the current environment under the names they were saved with.
# NOTE(review): presumably this provides UJT and the link shapefile objects
# used further down - confirm against the .RData contents.
cege_data <- "./0_source_data/UJTWorkSpace.RData"
load(file = cege_data)

2. Area selection (Islington)

Select area(s)

# Keep only the links that lie completely inside the chosen borough.
# With sparse = FALSE, st_within() returns a dense logical matrix (one row per
# link, one column per polygon passed as y), which is used directly as the row
# filter on LCAPShp_sf.
# NOTE(review): assumes exactly one LondonBor row is named "Islington" - confirm.
LCAPShp_sf_sub <- LCAPShp_sf[
  st_within(
    x = LCAPShp_sf,
    y = LondonBor[LondonBor[["NAME"]] == "Islington", ],
    sparse = FALSE
  ),
]
although coordinates are longitude/latitude, st_within assumes that they are planar
# Pull out the IDs of the selected links and report how many there are
link_list <- LCAPShp_sf_sub[["LCAP_ID"]]

length(link_list)
[1] 31
# show the selected link IDs in the notebook output before exporting them
print(link_list)
 [1] 2464  418 1807 1810 1607 1321 1632 1444 1445 1626 1426 1430 2054 2055 2420 2421 2422 2423
[19] 2058 2061 2126 2425 2428  448  450  583  481  589 2429  650  692
# Export the selected link IDs to CSV. write.csv() defaults are used, so row
# names are written alongside the IDs.
write.csv(link_list, file = "./2_data_split/selected_links.csv")

3. Data sub-selection for further analysis

3.1 UJT table

UJT table - each link (column) across time (row)

# Export all source data into python friendly .csv files

# Take selected links and export selections of source data

# select relevant columns

# UJT columns are addressed by link ID as a character name (see the column
# lookup at the end of this chunk), so the selected IDs are needed as strings.
# as.character() is vectorised: no counter or element-by-element growth of the
# result is required, and an empty link_list gives character(0) instead of NULL.
link_list_string <- as.character(link_list)

# Inspect the IDs in both representations
link_list
link_list_string

# List the link IDs that UJT actually has columns for
sort(colnames(UJT))

# Spot-check the UJT column of the first selected link
UJT[, "2464"]
LS0tCnRpdGxlOiAiQ0VHRTAwNDIgQXNzaWdubWVudCAtIGRhdGEgcHJlcCIKb3V0cHV0OiBodG1sX25vdGVib29rCi0tLQoKIyMjIERvY3VtZW50IGRlc2NyaXB0aW9uOgpUaGlzIG5vdGVib29rIGNvbnRhaW5zIGNvZGUgdG8gcHJvY2VzcyByYXcgZGF0YSBwcm92aWRlZCBmb3IgQ0VHRTAwNDIgZmluYWwgYXNzaWdubWVudC4KSXQgY292ZXJzOjxicj4KCjEuIFByb2plY3Qgc2V0IHVwCgoyLiBBcmVhIHNlbGVjdGlvbiAoSXNsaW5ndG9uKQoKMy4gRGF0YSBzdWItc2VsZWN0aW9uIGZvciBmdXJ0aGVyIGFuYWx5c2lzCgoKIyMjIDEuIFByb2plY3Qgc2V0IHVwOgoKYGBge3J9CiNQYWNrYWdlcwpsaWJyYXJ5KHNmKQpsaWJyYXJ5KHNwKQpsaWJyYXJ5KHRtYXApCgojV29ya2luZyBkaXJlY3RvcnkgZGVmaW5pdGlvbgojZ2V0d2QoKQoKI0xvYWQgZGF0YQpjZWdlX2RhdGEgPC0gIi4vMF9zb3VyY2VfZGF0YS9VSlRXb3JrU3BhY2UuUkRhdGEiCmxvYWQoY2VnZV9kYXRhKQpgYGAKCgojIyMgMi4gQXJlYSBzZWxlY3Rpb24gKElzbGluZ3RvbikKCiMjIyMgRmxhZyBsaW5rcyB3aXRoIGRhdGEKYGBge3J9CiNJbiBVSlQgdGhlcmUgYXJlIDI1NiBsaW5rIGlkcyB3aXRoIGRhdGEKYWxsX1VKVF9saW5rcyA8LSBjb2xuYW1lcyhVSlQpCmxlbmd0aChhbGxfVUpUX2xpbmtzKQoKI0luIG91ciBzaGFwZSBmaWxlLCB0aGVyZSBhcmUgMTQwMiBsaW5rIGlkcwpsZW5ndGgoTENBUFNocCRMQ0FQX0lEKQoKI0ZsYWcgd2hpY2ggbGlua3MgaW4gc2hhcGUgZmlsZSB3ZSBoYXZlIGRhdGEgZm9yCkxDQVBTaHAkSGF2ZURhdGFGbGFnIDwtIDAKCmNvdW50ZXIgPC0gMApmb3IgKG1hc3Rlcl9saW5rX3ZhbHVlIGluIExDQVBTaHAkTENBUF9JRCkgewogIGNvdW50ZXIgPC0gY291bnRlciArIDEKICAKICBpZiAobWFzdGVyX2xpbmtfdmFsdWUgJWluJSBhbGxfVUpUX2xpbmtzKSB7CiAgICBMQ0FQU2hwJEhhdmVEYXRhRmxhZ1tjb3VudGVyXSA8LSAxCiAgfQogIGVsc2V7CiAgICBMQ0FQU2hwJEhhdmVEYXRhRmxhZ1tjb3VudGVyXSA8LSAwCiAgfQogIAp9CgojQ2hlY2sgdGhhdCBzdW0gaXMgZXF1YWwgdG8gYWxsIGxpbmtzIHdlIGhhdmUgZGF0YSBmb3IKc3VtKExDQVBTaHAkSGF2ZURhdGFGbGFnKQpgYGAKCiMjIyMgU3ViLXNlbGVjdCBsaW5rcyAodmlzdWFsaXNlIGRhdGEgYXZhaWxhYmxpdHkpCmBgYHtyfQojIExpbmsgc2hwIGZpbGUgdG8gdG8gc2Ygb2JqZWN0CkxDQVBTaHBfc2YgPC0gc3RfYXNfc2YoTENBUFNocCkKCiMgVmlzdWFsaXNlIGZpZWxkIHRvIHNob3cgbGlua3Mgd2l0aCBzcGVlZCBkYXRhCiNwbG90KExDQVBTaHBfc2ZbIkhhdmVEYXRhRmxhZyJdKQoKIyBMb2FkIHJlZmVyZW5jZSBzaGFwZSBmaWxlIGZvciBMb25kb24gQm9yb3VnaAojIHJlYWQgaW4gcG9seWdvbiBzaHAgYW5kIHNldCBjcnMgdG8gbWF0Y2ggCkxvbmRvbkJvciA8LSBzdF9yZWFkKCcuLzFfc2hhcGVfZmlsZXMvc2hhcGVmaWxlcy9Mb25kb25fQm9yb3VnaF9FeGNsdWRpbmdfTUhX
LnNocCcpICU+JQogIHN0X3RyYW5zZm9ybShMb25kb25Cb3IsIGNycyA9IHN0X2NycyhMQ0FQU2hwX3NmKSkKCiMgZm9yIGludGVyYWN0aXZlIHZpZXdpbmcgCnRtYXBfbW9kZSgidmlldyIpCgojIGxheWVyIHRoZSBib3JvdWdocywgYWxsIGxpbmtzLCBhbmQgc2VsZWN0ZWQgbGlua3MgCnRtX3NoYXBlKExvbmRvbkJvcikrCiAgdG1fcG9seWdvbnMoY29sPSd3aGl0ZScpKwogIHRtX3NoYXBlKExDQVBTaHBfc2YpKwogIHRtX2xpbmVzKGNvbD0nbGlnaHRncmVlbicpKwogIHRtX3NoYXBlKExDQVBTaHBfc2ZbIkxDQVBfSUQiXSkrCiAgdG1fbGluZXMoY29sID0gIkxDQVBfSUQiKQoKI0xDQVBfSUQKI0hhdmVEYXRhRmxhZwpgYGAKCiMjIyMgU2VsZWN0IGFyZWEocykKYGBge3J9CiMgZ2V0IGFsbCBsaW5rcyB0aGF0IGFyZSB0b3RhbGx5IHdpdGhpbiBhIGdpdmVuIGJvcm91Z2gKTENBUFNocF9zZl9zdWIgPC0gTENBUFNocF9zZltzdF93aXRoaW4oTENBUFNocF9zZiwgCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgIExvbmRvbkJvcltMb25kb25Cb3IkTkFNRSA9PSAiSXNsaW5ndG9uIixdLCAKICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgc3BhcnNlID0gRkFMU0UpLF0KCiMgY2hlY2sgbnVtYmVyIG9mIGxpbmtzIGluIHRoZSBzdWJzZXQKbGlua19saXN0IDwtIExDQVBTaHBfc2Zfc3ViJExDQVBfSUQKCmxlbmd0aChsaW5rX2xpc3QpCiMgZXhwb3J0IGxpc3Qgb2YgbGlua3MKcHJpbnQobGlua19saXN0KQp3cml0ZS5jc3YoeCA9IGxpbmtfbGlzdCwiLi8yX2RhdGFfc3BsaXQvc2VsZWN0ZWRfbGlua3MuY3N2IikKYGBgCgojIyMjIHZpc3VhbGlzZSBsaW5rcwpgYGB7cn0KIyBwbG90IHRvIHRha2UgYSBsb29rCnBsb3QoTENBUFNocF9zZl9zdWIpCgojIGZvciBpbnRlcmFjdGl2ZSB2aWV3aW5nIAp0bWFwX21vZGUoInZpZXciKQoKIyBsYXllciB0aGUgYm9yb3VnaHMsIGFsbCBsaW5rcywgYW5kIHNlbGVjdGVkIGxpbmtzIAp0bV9zaGFwZShMb25kb25Cb3IpKwogIHRtX3BvbHlnb25zKGNvbD0nd2hpdGUnKSsKICB0bV9zaGFwZShMQ0FQU2hwX3NmKSsKICB0bV9saW5lcyhjb2w9J2xpZ2h0Z3JlZW4nKSsKICB0bV9zaGFwZShMQ0FQU2hwX3NmX3N1YikrCiAgdG1fbGluZXMoY29sPSdyZWQnKQpgYGAKCgojIyMgMy4gRGF0YSBzdWItc2VsZWN0aW9uIGZvciBmdXJ0aGVyIGFuYWx5c2lzCgojIyMjIDMuMSBVSlQgdGFibGUKVUpUIHRhYmxlIC0gZWFjaCBsaW5rIChjb2x1bW4pIGFjcm9zcyB0aW1lIChyb3cpCmBgYHtyfQojIEV4cG9ydCBhbGwgc291cmNlIGRhdGEgaW50byBweXRob24gZnJpZW5kbHkgLmNzdiBmaWxlcwoKIyBUYWtlIHNlbGVjdGVkIGxpbmtzIGFuZCBleHBvcnQgc2VsZWN0aW9ucyBvZiBzb3VyY2UgZGF0YQoKIyBzZWxlY3QgcmVsZXZhbnQgY29sdW1ucwoKY291bnRlciA9IDAKbGlua19saXN0X3N0cmluZyA8LSBjKCkKCmZvciAoZW50cnkgaW4gbGlua19saXN0KSB7CiAgI3ByaW50KGVudHJ5KQogIGNvdW50
ZXIgPC0gY291bnRlciArIDEKICB0ZW1wX3N0cmluZyA8LSB0b1N0cmluZyhlbnRyeSkKICBsaW5rX2xpc3Rfc3RyaW5nW1tjb3VudGVyXV0gPC0gdGVtcF9zdHJpbmcKfQpsaW5rX2xpc3QKbGlua19saXN0X3N0cmluZwoKc29ydChjb2xuYW1lcyhVSlQpKQoKVUpUWyxjKCIyNDY0IildCgoKYGBgCgoKCgo=